
# Environment variables handed to the test target below through its `env`
# attribute. All values are strings.
#   DEVICE_RESERVE_MEMORY_BYTES: 512,000,000 bytes (512 MB, decimal).
#   LOAD_PYTHON_MODEL: set to "1" (presumably an enable flag read by the code
#     under test; confirm against the consumer of this variable).
test_envs = dict(
    DEVICE_RESERVE_MEMORY_BYTES = "512000000",
    LOAD_PYTHON_MODEL = "1",
)

# Python test target built from qwen3_test.py, run with the `test_envs`
# environment and depending on the standalone rtp_auto_model library.
# NOTE(review): the "H20" tag and the `gpu` exec property presumably steer the
# test onto H20 GPU executors; confirm against the CI / remote-execution
# platform configuration.
py_test(
    name = "qwen3_test",
    srcs = ["qwen3_test.py"],
    env = test_envs,
    exec_properties = {"gpu": "H20"},
    tags = ["H20"],
    deps = ["//rtp_llm/models_py/standalone:rtp_auto_model"],
)

